ReverseSequence
对输入序列进行部分反转。
- 输入:
src - 需反转数据的地址
seq_lengths - 指定反转长度,为一维向量。
param - 算子计算所需参数的结构体。其各成员见下述。
core_mask - 核掩码。
ReverseSequenceParameter定义:
1typedef struct ReverseSequenceParameter {
2 int* shape_; // 输入和输出张量的形状
3 int* strides_; // 一个记录张量每一维步长的数组
4 int seq_dim_; // 指定反转的维度
5 int batch_dim_; // 指定切片维度
6 int ndim_; // 输入和输出张量的维度
7 int type_size_; // 输入和输出张量数据类型的长度
8 int copy_elem_num_; // 在inner_count循环中一次应被拷贝的元素数目
9 int outer_stride_; // 外层元素间的步长
10 int outer_count_; // 外层元素数
11 int inner_stride_; // 内层元素间的步长
12 int inner_count_; // 内层元素数
13} ReverseSequenceParameter;
- 输出:
dst - 输出地址。
- 支持平台:
FT78NEMT7004
备注
FT78NE 支持int8, int16, int32, fp32, fp64, cplx64, cplx128
MT7004 支持fp16, fp32, int16, int32, cplx64
共享/私有存储版本:
-
void anytype_reverse_sequence_anycore(void *src, void *dst, int *seq_lengths, ReverseSequenceParameter *param, int core_mask)
各种数据类型、私有及共享空间版本均使用该函数。对于不同数据类型,改变param中的type_size_参数即可。
C调用示例:
1void Resize(ReverseSequenceParameter* param) {
2 param->strides_ = (int*)0xA8020000;
3 ComputeStrides(param->shape_, param->strides_, param->ndim_);
4 int less_dim = param->batch_dim_ > param->seq_dim_ ? param->seq_dim_ : param->batch_dim_;
5 int greater_dim = param->batch_dim_ < param->seq_dim_ ? param->seq_dim_ : param->batch_dim_;
6 // calculate the size of elements should be copied at one time
7 param->copy_elem_num_ = CountElementAfterDim(param->shape_, greater_dim, param->ndim_);
8 // calculate the number of elements before the less axis and the stride
9 param->outer_count_ = CountElementBeforeDim(param->shape_, less_dim);
10 param->outer_stride_ = param->shape_[less_dim] * CountElementAfterDim(param->shape_, less_dim, param->ndim_);
11 // calculate the number of elements between the less axis and the greater axis and the stride
12 param->inner_count_ = 1;
13 int i;
14 for (i = less_dim + 1; i < greater_dim; i++) {
15 param->inner_count_ *= param->shape_[i];
16 }
17 param->inner_stride_ = param->shape_[greater_dim] * CountElementAfterDim(param->shape_, greater_dim, param->ndim_);
18}
19
20void TestReverseSequenceFp32(int* shape, int* orig_seq_lengths, int seq_dim, int batch_dim, int ndim, int core_mask) {
21 int core_id = get_core_id();
22 int core_num = GetCoreNum(core_mask);
23 int logic_core_id = GetLogicCoreId(core_mask, core_id);
24 float* input_data = (float*)0x88000000; // 测试私有空间时地址设置在私有空间内即可
25 float* output_data = (float*)0x98000000;
26 float* check = (float*)0xB8000000;
27 int* seq_lengths = (int*)0xC8000000;
28 ReverseSequenceParameter* param = (ReverseSequenceParameter*)0xA8000000;
29 int i;
30 if (logic_core_id == 0) {
31 param->shape_ = (int*)0xA8010000;
32 memcpy(param->shape_, shape, sizeof(int) * ndim);
33 memcpy(seq_lengths, orig_seq_lengths, sizeof(int) * shape[batch_dim]);
34 param->batch_dim_ = batch_dim;
35 param->seq_dim_ = seq_dim;
36 param->ndim_ = ndim;
37 param->type_size_ = sizeof(float);
38 Resize(param);
39 }
40 sys_bar(0, core_num); // 初始化参数完成后进行同步
41 anytype_reverse_sequence_anycore(input_data, output_data, seq_lengths, param, core_mask);
42}
43
44void main(){
45 int shape[3] = {3, 4, 10};
46 int seq_lengths[3] = {1, 2, 3};
47 int ndim = 3;
48 int seq_dim = 1;
49 int batch_dim = 0;
50 int core_mask = 0b1111; // 测试单核时核掩码设置为0b0001即可
51 TestReverseSequenceFp32(shape, seq_lengths, seq_dim, batch_dim, ndim, core_mask);
52}